from transformers import AutoTokenizer

# Load both tokenizers up front (7B first, then 0.5B) so that any loading
# output appears before the size report below.
tok7b, tok05b = (
    AutoTokenizer.from_pretrained(
        "/mnt/ssd/jsj/models/models/Qwen/Qwen2.5-7B-Instruct"
    ),
    AutoTokenizer.from_pretrained(
        "/mnt/ssd/jsj/models/models/Qwen/Qwen2.5-0.5B-Instruct"
    ),
)

# Print len() of each tokenizer side by side so the two checkpoints can be
# compared at a glance.
for label, tokenizer in (("7B vocab:", tok7b), ("0.5B vocab:", tok05b)):
    print(label, len(tokenizer))
